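# Column selection for the microwave review data.
# Drops the 'marketplace' and 'product_category' columns and saves the result.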

import pandas as pd

# Input/output locations (relative, Windows-style paths).
inputfile = r"..\data\microwave.tsv"  # aggregated review file
outputfile2 = r"..\data\microwave_1selected.tsv"  # data after column selection

# Columns removed from the dataset before it is saved.
dropped_columns = ['marketplace', 'product_category']

# Load the tab-separated reviews and show which columns are available.
data = pd.read_csv(inputfile, encoding='utf-8', sep='\t')
print(data.columns)

# Remove the unwanted columns and write the result back out as TSV.
# NOTE: to_csv is called with its default index setting, so the row index
# is written as the first (unnamed) column of the output file.
data = data.drop(columns=dropped_columns)
data.to_csv(outputfile2, sep='\t')
